import ollama

# Ask a single question to a local Ollama model and print the reply.

# Read the question from stdin; an empty entry falls back to the demo prompt.
question = input("请输入问题：") or "20字介绍北京"

response = ollama.generate(
    model="qwen2.5:3b",
    prompt=question,
    options={
        # Near-zero temperature keeps the output close to deterministic.
        "temperature": 0.01,
        "top_p": 0.7,
        # Ollama's option for capping generated tokens is `num_predict`;
        # `max_tokens` is not an Ollama option, so the cap was never applied.
        "num_predict": 200,
    },
)

# Key access works both with older clients that return a plain dict and with
# newer clients whose response objects are subscriptable.
answer = response["response"]

print("问:", question, "?\n答:", answer)